• Java实现一个简单的网络爬虫


    Java实现一个简单的网络爬虫

     1 import java.io.BufferedReader;
     2 import java.io.BufferedWriter;
     3 import java.io.FileWriter;
     4 import java.io.IOException;
     5 import java.io.InputStream;
     6 import java.io.InputStreamReader;
     7 import java.net.MalformedURLException;
     8 import java.net.URL;
     9 
    10 
    /**
     * Minimal web-crawler demo: downloads a single page over a URL stream and
     * appends its text, line by line, to a local file, then echoes the page to
     * standard output.
     *
     * <p>Usage: {@code java BasicSpaider [url] [outputFile] [charset]}. Every
     * argument is optional; a missing argument falls back to the corresponding
     * {@code DEFAULT_*} constant below.
     */
    public class BasicSpaider {

        /** Page fetched when no URL argument is supplied. */
        private static final String DEFAULT_URL = "http://www.163.com";

        /** File the page is appended to when no output-file argument is supplied. */
        private static final String DEFAULT_OUTPUT_FILE = "C:/Users/Xiaofei/Desktop/163首页.txt";

        /** Charset used to decode the response when no charset argument is supplied. */
        private static final String DEFAULT_CHARSET = "GBK";

        /**
         * Fetches the page and saves it.
         *
         * <p>Failures (malformed URL, unsupported charset, network or file errors)
         * are reported on standard error and end the run without throwing.
         *
         * @param args optional {@code [url, outputFile, charset]}; may be empty or
         *             {@code null}
         */
        public static void main(String[] args) {
            String address = argOrDefault(args, 0, DEFAULT_URL);
            String outputFile = argOrDefault(args, 1, DEFAULT_OUTPUT_FILE);
            String charset = argOrDefault(args, 2, DEFAULT_CHARSET);

            StringBuilder page = new StringBuilder();

            // try-with-resources closes whatever was successfully opened, in
            // reverse order, even when a later resource fails to open. The writer
            // is opened first (append mode), as in the original flow.
            try (BufferedWriter out = new BufferedWriter(new FileWriter(outputFile, true));
                    InputStream in = new URL(address).openStream();
                    BufferedReader reader =
                            new BufferedReader(new InputStreamReader(in, charset))) {
                String line;
                while ((line = reader.readLine()) != null) {
                    // readLine() strips the line terminator, so put one back;
                    // otherwise the saved page collapses onto a single line.
                    out.write(line);
                    out.newLine();
                    page.append(line).append('\n');
                }
            } catch (MalformedURLException e) {
                System.err.println("Invalid URL: " + address);
                e.printStackTrace();
                return;
            } catch (IOException e) {
                System.err.println("Failed to copy " + address + " to " + outputFile);
                e.printStackTrace();
                return;
            }

            // Report completion only after the file has been flushed and closed.
            System.out.print(page);
            System.out.println("完成");
        }

        /** Returns {@code args[index]} when present and non-null, otherwise {@code fallback}. */
        private static String argOrDefault(String[] args, int index, String fallback) {
            if (args == null || index >= args.length || args[index] == null) {
                return fallback;
            }
            return args[index];
        }

    }
  • 相关阅读:
    pip安装
    nfs
    源码方式安装软件
    自启动
    multipath
    linux永久添加和删除路由
    iscsi
    linux识别workstation磁盘的uuid
    centos镜像各种cd,dvd版本区别
    转:C# 中 MSCHART 饼状图显示百分比
  • 原文地址:https://www.cnblogs.com/rememberme/p/BasicSpaider.html
Copyright © 2020-2023  润新知