通过JAVA获取优酷、土豆、酷6、6间房等视频

通过JAVA获取优酷、土豆、酷6、6间房、56视频,现在很多社会网站都有这个功能,用户输入优酷、土豆、酷6、6间房、56视频地址后,能找到对应的视频及视频的缩略图,有些社区网站还能获取到视频的时长。
比如:新浪微博就有这个功能,当用户输入优酷、土豆、酷6、6间房、56视频网址后,就能获取到相应的视频地址及视频的缩略图。

其中要用到一个JAR包,链接地址如下:
http://jsoup.org/packages/jsoup-1.5.2.jar



import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

/**
* 视频工具类
* @author sunlightcs
* 2011-4-6
* http://hi.juziku.com/sunlightcs/
*/
public class VideoUtil {

/**
  * 获取视频信息
  * @param url
  * @return
  */
public static Video getVideoInfo(String url){
  Video video = new Video();
 
  if(url.indexOf("v.youku.com")!=-1){
   try {
    video = getYouKuVideo(url);
   } catch (Exception e) {
    video = null;
   }
  }else if(url.indexOf("tudou.com")!=-1){
   try {
    video = getTudouVideo(url);
   } catch (Exception e) {
    video = null;
   }
  }else if(url.indexOf("v.ku6.com")!=-1){
   try {
    video = getKu6Video(url);
   } catch (Exception e) {
    video = null;
   }
  }else if(url.indexOf("6.cn")!=-1){
   try {
    video = get6Video(url);
   } catch (Exception e) {
    video = null;
   }
  }else if(url.indexOf("56.com")!=-1){
   try {
    video = get56Video(url);
   } catch (Exception e) {
    video = null;
   }
  }
 
  return video;
}


/**
  * 获取优酷视频
  * @param url 视频URL
  */
public static Video getYouKuVideo(String url) throws Exception{
  Document doc = getURLContent(url);
 
  /**
   *获取视频缩略图
   */
  String pic = getElementAttrById(doc, "s_sina", "href");
  int local = pic.indexOf("pic=");
  pic = pic.substring(local+4);
 
  /**
   * 获取视频地址
   */ 
  String flash = getElementAttrById(doc, "link2", "value");
 
  /**
   * 获取视频时间
   */
  String time = getElementAttrById(doc, "download", "href");
  String []arrays = time.split("\\|");
  time = arrays[4];
 
  Video video = new Video();
  video.setPic(pic);
  video.setFlash(flash);
  video.setTime(time);
 
  return video;
}


/**
  * 获取土豆视频
  * @param url 视频URL
  */
public static Video getTudouVideo(String url) throws Exception{
  Document doc = getURLContent(url);
  String content = doc.html();
  int beginLocal = content.indexOf("<script>document.domain");
  int endLocal = content.indexOf("</script>");
  content = content.substring(beginLocal, endLocal);
 
  /**
   * 获取视频地址
   */
  String flash = getScriptVarByName("iid_code", content);
  flash = "http://www.tudou.com/v/" + flash + "/v.swf";
 
  /**
   *获取视频缩略图
   */
  String pic = getScriptVarByName("thumbnail", content);
 
  /**
   * 获取视频时间
   */
  String time = getScriptVarByName("time", content);

  Video video = new Video();
  video.setPic(pic);
  video.setFlash(flash);
  video.setTime(time);
 
  return video;
}


/**
  * 获取酷6视频
  * @param url 视频URL
  */
public static Video getKu6Video(String url) throws Exception{
  Document doc = getURLContent(url);
 
  /**
   * 获取视频地址
   */
  Element flashEt = doc.getElementById("outSideSwfCode");
  String flash = flashEt.attr("value");
 
  /**
   * 获取视频缩略图
   */
  Element picEt = doc.getElementById("plVideosList");
  String time = null;
  String pic = null;
  if(picEt!=null){
   Elements pics = picEt.getElementsByTag("img");
   pic = pics.get(0).attr("src");
  
   /**
    * 获取视频时长
    */
   Element timeEt = picEt.select("span.review>cite").first();
   time = timeEt.text();
  }else{
   pic = doc.getElementsByClass("s_pic").first().text();
  }
 
  Video video = new Video();
  video.setPic(pic);
  video.setFlash(flash);
  video.setTime(time);
 
  return video;
 
}


/**
  * 获取6间房视频
  * @param url 视频URL
  */
public static Video get6Video(String url) throws Exception{
  Document doc = getURLContent(url);
 
  /**
   * 获取视频缩略图
   */
  Element picEt = doc.getElementsByClass("summary").first();
  String pic = picEt.getElementsByTag("img").first().attr("src");
 
  /**
   * 获取视频时长
   */
  String time = getVideoTime(doc, url, "watchUserVideo");
  if(time==null){
   time = getVideoTime(doc, url, "watchRelVideo");
  }
 
  /**
   * 获取视频地址
   */
  Element flashEt = doc.getElementById("video-share-code");
  doc = Jsoup.parse(flashEt.attr("value")); 
  String flash = doc.select("embed").attr("src");
 
  Video video = new Video();
  video.setPic(pic);
  video.setFlash(flash);
  video.setTime(time);
 
  return video;
}


/**
  * 获取56视频
  * @param url 视频URL
  */
public static Video get56Video(String url) throws Exception{
  Document doc = getURLContent(url);
  String content = doc.html();
 
  /**
   * 获取视频缩略图
   */
  int begin = content.indexOf("\"img\":\"");
  content = content.substring(begin+7, begin+200);
  int end = content.indexOf("\"};");
  String pic = content.substring(0, end).trim();
  pic = pic.replaceAll("\\\\", ""); 
 
  /**
   * 获取视频地址
   */
  String flash = "http://player.56.com" + url.substring(url.lastIndexOf("/"), url.lastIndexOf(".html")) + ".swf";
 
  Video video = new Video();
  video.setPic(pic);
  video.setFlash(flash);
 
  return video;
}

/**
  * 获取6间房视频时长   
  */
private static String getVideoTime(Document doc, String url, String id) {
  String time = null;
 
  Element timeEt = doc.getElementById(id);
  Elements links = timeEt.select("dt > a");
 
 
  for (Element link : links) {
    String linkHref = link.attr("href");
    if(linkHref.equalsIgnoreCase(url)){
     time = link.parent().getElementsByTag("em").first().text();
     break;
    }
  }
  return time;
}

  
/**
  * 获取script某个变量的值
  * @param name 变量名称
  * @return 返回获取的值
  */
private static String getScriptVarByName(String name, String content){
  String script = content;
 
  int begin = script.indexOf(name);
 
  script = script.substring(begin+name.length()+2);
 
  int end = script.indexOf(",");
 
  script = script.substring(0,end);
 
  String result=script.replaceAll("'", "");
  result = result.trim();
 
  return result;
}


/**
  * 根据HTML的ID键及属于名,获取属于值
  * @param id HTML的ID键
  * @param attrName 属于名
  * @return 返回属性值
  */
private static String getElementAttrById(Document doc, String id, String attrName)throws Exception{
  Element et = doc.getElementById(id);
  String attrValue = et.attr(attrName);
 
  return attrValue;
}



/**
  * 获取网页的内容
  */
private static Document getURLContent(String url) throws Exception{
  Document doc = Jsoup.connect(url)
    .data("query", "Java")
    .userAgent("Mozilla")
    .cookie("auth", "token")
    .timeout(6000)
    .post();
  return doc;
}


public static void main(String[] args) {
  //String url = "http://v.youku.com/v_show/id_XMjU0MjI2NzY0.html";
  //String url = "http://www.tudou.com/programs/view/pVploWOtCQM/";
  //String url = "http://v.ku6.com/special/show_4024167/9t7p64bisV2A31Hz.html";
  //String url = "http://v.ku6.com/show/BpP5LeyVwvikbT1F.html";
  //String url = "http://6.cn/watch/14757577.html";
  String url = "http://www.56.com/u64/v_NTkzMDEzMTc.html";
  Video video = getVideoInfo(url);
  System.out.println("视频缩略图:"+video.getPic());
  System.out.println("视频地址:"+video.getFlash());
  System.out.println("视频时长:"+video.getTime());
}
}


/**
* 视频封装
* @author sunlightcs
* 2011-4-6
* http://hi.juziku.com/sunlightcs/
*/
public class Video {
private String flash;
private String pic;
private String time;
public String getFlash() {
  return flash;
}
public void setFlash(String flash) {
  this.flash = flash;
}
public String getPic() {
  return pic;
}
public void setPic(String pic) {
  this.pic = pic;
}
public String getTime() {
  return time;
}
public void setTime(String time) {
  this.time = time;
}
}

你可能感兴趣的:(java)