通过JAVA获取优酷、土豆、酷6、6间房、56视频,现在很多社会网站都有这个功能,用户输入优酷、土豆、酷6、6间房、56视频地址后,能找到对应的视频及视频的缩略图,有些社区网站还能获取到视频的时长。
比如:新浪微博就有这个功能,当用户输入优酷、土豆、酷6、6间房、56视频网址后,就能获取到相应的视频地址及视频的缩略图。
其中要用到一个JAR包,链接地址如下:
http://jsoup.org/packages/jsoup-1.5.2.jar
原文地址:http://www.juziku.com/wiki/906.htm
核心代码:
import org.jsoup.Jsoup; import org.jsoup.nodes.Document; import org.jsoup.nodes.Element; import org.jsoup.select.Elements; /** * 视频工具类 * http://hi.juziku.com/sunlightcs/ */ public class VideoUtil { /** * 获取视频信息 * @param url * @return */ public static Video getVideoInfo(String url){ Video video = new Video(); if(url.indexOf("v.youku.com")!=-1){ try { video = getYouKuVideo(url); } catch (Exception e) { video = null; } }else if(url.indexOf("tudou.com")!=-1){ try { video = getTudouVideo(url); } catch (Exception e) { video = null; } }else if(url.indexOf("v.ku6.com")!=-1){ try { video = getKu6Video(url); } catch (Exception e) { video = null; } }else if(url.indexOf("6.cn")!=-1){ try { video = get6Video(url); } catch (Exception e) { video = null; } }else if(url.indexOf("56.com")!=-1){ try { video = get56Video(url); } catch (Exception e) { video = null; } } return video; } /** * 获取优酷视频 * @param url 视频URL */ public static Video getYouKuVideo(String url) throws Exception{ Document doc = getURLContent(url); /** *获取视频缩略图 */ String pic = getElementAttrById(doc, "s_sina", "href"); int local = pic.indexOf("pic="); pic = pic.substring(local+4); /** * 获取视频地址 */ String flash = getElementAttrById(doc, "link2", "value"); /** * 获取视频时间 */ String time = getElementAttrById(doc, "download", "href"); String []arrays = time.split("\\|"); time = arrays[4]; Video video = new Video(); video.setPic(pic); video.setFlash(flash); video.setTime(time); return video; } /** * 获取土豆视频 * @param url 视频URL */ public static Video getTudouVideo(String url) throws Exception{ Document doc = getURLContent(url); String content = doc.html(); int beginLocal = content.indexOf("<script>document.domain"); int endLocal = content.indexOf("</script>"); content = content.substring(beginLocal, endLocal); /** * 获取视频地址 */ String flash = getScriptVarByName("iid_code", content); flash = "http://www.tudou.com/v/" + flash + "/v.swf"; /** *获取视频缩略图 */ String pic = getScriptVarByName("thumbnail", content); /** * 获取视频时间 */ String time = getScriptVarByName("time", content); Video video = new Video(); video.setPic(pic); video.setFlash(flash); video.setTime(time); return video; } /** * 获取酷6视频 * @param url 视频URL */ public static Video getKu6Video(String url) throws Exception{ Document doc = getURLContent(url); /** * 获取视频地址 */ Element flashEt = doc.getElementById("outSideSwfCode"); String flash = flashEt.attr("value"); /** * 获取视频缩略图 */ Element picEt = doc.getElementById("plVideosList"); String time = null; String pic = null; if(picEt!=null){ Elements pics = picEt.getElementsByTag("img"); pic = pics.get(0).attr("src"); /** * 获取视频时长 */ Element timeEt = picEt.select("span.review>cite").first(); time = timeEt.text(); }else{ pic = doc.getElementsByClass("s_pic").first().text(); } Video video = new Video(); video.setPic(pic); video.setFlash(flash); video.setTime(time); return video; } /** * 获取6间房视频 * @param url 视频URL */ public static Video get6Video(String url) throws Exception{ Document doc = getURLContent(url); /** * 获取视频缩略图 */ Element picEt = doc.getElementsByClass("summary").first(); String pic = picEt.getElementsByTag("img").first().attr("src"); /** * 获取视频时长 */ String time = getVideoTime(doc, url, "watchUserVideo"); if(time==null){ time = getVideoTime(doc, url, "watchRelVideo"); } /** * 获取视频地址 */ Element flashEt = doc.getElementById("video-share-code"); doc = Jsoup.parse(flashEt.attr("value")); String flash = doc.select("embed").attr("src"); Video video = new Video(); video.setPic(pic); video.setFlash(flash); video.setTime(time); return video; } /** * 获取56视频 * @param url 视频URL */ public static Video get56Video(String url) throws Exception{ Document doc = getURLContent(url); String content = doc.html(); /** * 获取视频缩略图 */ int begin = content.indexOf("\"img\":\""); content = content.substring(begin+7, begin+200); int end = content.indexOf("\"};"); String pic = content.substring(0, end).trim(); pic = pic.replaceAll("\\\\", ""); /** * 获取视频地址 */ String flash = "http://player.56.com" + url.substring(url.lastIndexOf("/"), url.lastIndexOf(".html")) + ".swf"; Video video = new Video(); video.setPic(pic); video.setFlash(flash); return video; } /** * 获取6间房视频时长 */ private static String getVideoTime(Document doc, String url, String id) { String time = null; Element timeEt = doc.getElementById(id); Elements links = timeEt.select("dt > a"); for (Element link : links) { String linkHref = link.attr("href"); if(linkHref.equalsIgnoreCase(url)){ time = link.parent().getElementsByTag("em").first().text(); break; } } return time; } /** * 获取script某个变量的值 * @param name 变量名称 * @return 返回获取的值 */ private static String getScriptVarByName(String name, String content){ String script = content; int begin = script.indexOf(name); script = script.substring(begin+name.length()+2); int end = script.indexOf(","); script = script.substring(0,end); String result=script.replaceAll("'", ""); result = result.trim(); return result; } /** * 根据HTML的ID键及属于名,获取属于值 * @param id HTML的ID键 * @param attrName 属于名 * @return 返回属性值 */ private static String getElementAttrById(Document doc, String id, String attrName)throws Exception{ Element et = doc.getElementById(id); String attrValue = et.attr(attrName); return attrValue; } /** * 获取网页的内容 */ private static Document getURLContent(String url) throws Exception{ Document doc = Jsoup.connect(url) .data("query", "Java") .userAgent("Mozilla") .cookie("auth", "token") .timeout(6000) .post(); return doc; } public static void main(String[] args) { //String url = "http://v.youku.com/v_show/id_XMjU0MjI2NzY0.html"; //String url = "http://www.tudou.com/programs/view/pVploWOtCQM/"; //String url = "http://v.ku6.com/special/show_4024167/9t7p64bisV2A31Hz.html"; //String url = "http://v.ku6.com/show/BpP5LeyVwvikbT1F.html"; //String url = "http://6.cn/watch/14757577.html"; String url = "http://www.56.com/u64/v_NTkzMDEzMTc.html"; Video video = getVideoInfo(url); System.out.println("视频缩略图:"+video.getPic()); System.out.println("视频地址:"+video.getFlash()); System.out.println("视频时长:"+video.getTime()); } }
视频封装类:
/** * 视频封装 * http://hi.juziku.com/sunlightcs/ */ public class Video { private String flash; private String pic; private String time; public String getFlash() { return flash; } public void setFlash(String flash) { this.flash = flash; } public String getPic() { return pic; } public void setPic(String pic) { this.pic = pic; } public String getTime() { return time; } public void setTime(String time) { this.time = time; } }