• Jsoup视频信息


    import java.io.IOException;
    import java.util.ArrayList;
    import java.util.HashMap;
    import java.util.List;
    import java.util.Map;
    
    import org.jsoup.Jsoup;
    import org.jsoup.nodes.Document;
    import org.jsoup.nodes.Element;
    import org.jsoup.select.Elements;
    
    /**
     * Crawls Tencent Video listing pages with jsoup, prints the metadata of every
     * listed video to standard output and hands the collected rows to
     * {@code ExportExcel} for export.
     */
    public class TencentVideo {

        /** Browser user agent sent with every request. */
        private static final String USER_AGENT =
                "Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/52.0.2743.116 Safari/537.36";

        /** Step added to the {@code offset} query parameter for each successive page. */
        private static final int PAGE_SIZE = 30;

        /** Upper bound on the number of listing pages requested per crawl. */
        private static final int MAX_PAGES = 167;

        /** Connection/read timeout passed to jsoup, in milliseconds. */
        private static final int TIMEOUT_MILLIS = 30000;

        /** Pause before every request, in milliseconds. */
        private static final long REQUEST_DELAY_MILLIS = 1000L;

        /**
         * Fetches up to {@link #MAX_PAGES} listing pages, prints each video found and
         * exports all collected rows once the crawl finishes.
         *
         * <p>The page offset ({@code pageNumber * PAGE_SIZE}) is appended directly to
         * {@code url}, so {@code url} must end with the offset parameter, e.g.
         * {@code "https://v.qq.com/x/list/tv?feature=44&offset="}. Crawling stops early
         * at the first page that contains no {@code li.list_item} element.
         *
         * <p>Failures are reported with {@code printStackTrace()} and are not
         * propagated; when the crawl fails, nothing is exported. If the thread is
         * interrupted while pausing between requests, its interrupt flag is restored
         * before returning.
         *
         * @param url listing URL prefix ending in {@code offset=}
         */
        public static void getTencentVideoName(String url) {
            List<Map<String,String>> resultList = new ArrayList<Map<String,String>>();
            int index = 1;
            try {
                for (int page = 0; page < MAX_PAGES; page++) {
                    String pageUrl = url + (page * PAGE_SIZE);
                    Thread.sleep(REQUEST_DELAY_MILLIS);
                    System.out.println("URL:" + pageUrl);
                    Elements items = fetchListItems(pageUrl);
                    // An empty selection means there is nothing (more) to read: stop paging.
                    if (items.isEmpty()) {
                        break;
                    }
                    for (Element item : items) {
                        Map<String,String> video = parseVideo(item);
                        printVideo(index, video);
                        resultList.add(video);
                        index++;
                    }
                }
                new ExportExcel().exportTencentExcle(resultList);
            } catch (InterruptedException e) {
                // Restore the flag so callers further up can still observe the interruption.
                Thread.currentThread().interrupt();
                e.printStackTrace();
            } catch (IOException e) {
                e.printStackTrace();
            } catch (Exception e) {
                // Whatever the export step may throw is reported the same way as before.
                e.printStackTrace();
            }
        }

        /** Downloads one listing page and returns its {@code li.list_item} elements. */
        private static Elements fetchListItems(String pageUrl) throws IOException {
            Document document = Jsoup.connect(pageUrl)
                    .userAgent(USER_AGENT)
                    // Attach cookie information (NOTE(review): "auth"/"token" look like placeholders - confirm).
                    .cookie("auth", "token")
                    // Set the timeout.
                    .timeout(TIMEOUT_MILLIS)
                    // Issue the request with GET; post() could be used instead.
                    .get();
            return document.select("li.list_item");
        }

        /** Extracts name, lead, description, score and play count from one list item. */
        private static Map<String,String> parseVideo(Element item) {
            Map<String,String> video = new HashMap<String,String>();
            video.put("name", item.select("strong.figure_title").select("a").attr("title"));
            video.put("lead", item.select("div.figure_desc").text());
            video.put("desc", item.select("span.figure_info").text());
            video.put("score", item.select("div.figure_score").text());
            video.put("dianbo", item.select("div.figure_count").text());
            return video;
        }

        /** Prints one parsed video, preceded by a numbered separator line. */
        private static void printVideo(int index, Map<String,String> video) {
            System.out.println("================== " + index + " =====================");
            System.out.println("名称:" + video.get("name"));
            System.out.println("主演:" + video.get("lead"));
            System.out.println("评分:" + video.get("score"));
            System.out.println("描述:" + video.get("desc"));
            System.out.println("点播量:" + video.get("dianbo"));
        }

        /**
         * Runs the crawler against one listing category. The alternative category
         * URLs are kept below, commented out, for reference.
         *
         * @param args unused
         */
        public static void main(String[] args) {
            // Movies
            //getTencentVideoName("http://v.qq.com/x/list/movie?itype=-1&offset=");
            // TV series
    //        getTencentVideoName("http://v.qq.com/x/list/tv?feature=-1&offset=");
            // Animation
    //        getTencentVideoName("http://v.qq.com/x/list/cartoon?itype=-1&offset=");
            // Children
    //        getTencentVideoName("http://v.qq.com/x/list/child?iarea=-1&offset=");
            // Variety shows
    //        getTencentVideoName("http://v.qq.com/x/list/variety?exclusive=-1&offset=");
            // Concerts
    //        getTencentVideoName("http://v.qq.com/x/list/music?istate=2&offset=");
            // Documentaries
    //        getTencentVideoName("http://v.qq.com/x/list/doco?itrailer=-1&offset=");
            // Exclusive movies
    //        getTencentVideoName("https://v.qq.com/x/list/movie?characteristic=5&offset=");
            // Exclusive TV series
            getTencentVideoName("https://v.qq.com/x/list/tv?feature=44&offset=");
        }
    }
  • 相关阅读:
    (算法)Hanoi Problem汉诺塔问题
    (剑指Offer)面试题48:不能被继承的类
    (剑指Offer)面试题47:不用加减乘除做加法
    (剑指Offer)面试题46:求1+2+3+....+n
    (剑指Offer)面试题45:圆圈中最后剩下的数字
    程序员应该知道的15件事 在生活与工作中用他们来警惕自己
    基于REST架构的Web Service设计
    互联网上五个最高级的搜索引擎
    哈佛经济学家关于工作效率的意外发现
    列举一些常见的系统系能瓶颈 Common Bottlenecks
  • 原文地址:https://www.cnblogs.com/julian-chang/p/11818397.html
Copyright © 2020-2023  润新知