1. 程式人生 > java扒頁面代碼

java扒頁面代碼

buffer follow http string read puts class utf utf-8

import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.FileOutputStream;
import java.io.FileWriter;
import java.io.InputStreamReader;
import java.io.OutputStreamWriter;
import java.net.URL;
import java.nio.charset.StandardCharsets;

/**
 * Downloads the text of a page and saves a copy of it to a local file.
 *
 * <p>The page is decoded as UTF-8 and read line by line. Each line is echoed to standard
 * output and written to the output file (encoded as UTF-8), followed by the platform line
 * separator.
 */
public class Test2{
    /** Page that is fetched when no URL argument is supplied. */
    private static final String DEFAULT_URL = "https://www.baidu.com";

    /** File that is written when no output-path argument is supplied. */
    private static final String DEFAULT_OUTPUT = "d:/code/data.html";

    /**
     * Copies the page to the output file, echoing every line to standard output.
     *
     * @param args optional overrides: {@code args[0]} is the URL to fetch and {@code args[1]}
     *     is the path of the file to write; any argument that is missing falls back to the
     *     built-in default, so running without arguments fetches {@code https://www.baidu.com}
     *     into {@code d:/code/data.html}
     * @throws Exception if the URL is malformed, the page cannot be opened or read, or the
     *     output file cannot be created or written
     */
    public static void main(String[] args)throws Exception{
        String pageAddress = (args != null && args.length > 0) ? args[0] : DEFAULT_URL;
        String outputPath = (args != null && args.length > 1) ? args[1] : DEFAULT_OUTPUT;
        URL url = new URL(pageAddress);

        // try-with-resources closes both streams even when reading or writing fails part-way,
        // so neither the network stream nor the file handle is leaked. The reader is opened
        // first so that a failed fetch does not create or truncate the output file.
        try (BufferedReader reader = new BufferedReader(
                     new InputStreamReader(url.openStream(), StandardCharsets.UTF_8));
             BufferedWriter writer = new BufferedWriter(
                     new OutputStreamWriter(new FileOutputStream(outputPath), StandardCharsets.UTF_8))) {
            String line;
            while ((line = reader.readLine()) != null) {
                System.out.println(line);
                writer.write(line);
                writer.newLine();
            }
        }
    }
}

java扒頁面代碼