日期:2014-05-17  浏览次数:20713 次

保存html源文件到txt
import java.io.BufferedReader;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.MalformedURLException;
import java.net.URL;

/**
 * Console utility that asks for a URL and a destination file path on standard
 * input, downloads the text served at the URL and writes it to the file line
 * by line.
 *
 * <p>All the work happens in the constructor; {@link #main(String[])} simply
 * creates an instance. I/O failures are reported with a stack trace on
 * standard error and do not propagate to the caller.
 *
 * <p>NOTE(review): the page is decoded and re-encoded with the platform
 * default charset (no charset is passed to {@code InputStreamReader} or
 * {@code String.getBytes()}), so pages in a different encoding may not
 * round-trip exactly.
 */
public class ReadUrlToTxt {
	/**
	 * Single reader for {@code System.in}, shared by both prompts. Using one
	 * Scanner matters: a Scanner may buffer more input than the token it
	 * returns, so a second Scanner on the same stream can miss the next answer
	 * when input is piped. It is deliberately never closed, because closing it
	 * would also close {@code System.in}.
	 */
	private final java.util.Scanner console = new java.util.Scanner(System.in);

	/** The URL entered by the user; stays {@code null} until it parses successfully. */
	private URL url = null;

	/**
	 * Runs the whole interactive download. Any {@link IOException} (including
	 * a malformed URL) is printed to standard error instead of being thrown.
	 */
	public ReadUrlToTxt() {
		try {
			init();
		} catch (IOException e) {
			e.printStackTrace();
		}
	}

	/**
	 * Prompts for the URL, opens it and hands the reader to
	 * {@link #saveHtmlToTxt(BufferedReader)}.
	 *
	 * @throws IOException if the URL is malformed (MalformedURLException is an
	 *                     IOException) or the stream cannot be opened or closed
	 */
	private void init() throws IOException {
		System.out.println("please enter a url");
		String strUrl = console.next();
		// Let a malformed URL propagate: continuing with a null url would only
		// fail later with a NullPointerException on openStream().
		url = new URL(strUrl);
		// try-with-resources closes the reader and its underlying connection.
		try (BufferedReader input = new BufferedReader(new InputStreamReader(
				url.openStream()))) {
			saveHtmlToTxt(input);
		}
	}

	/**
	 * Prompts for a destination path and copies every line from {@code input}
	 * into that file, each followed by the platform line separator.
	 *
	 * @param input reader positioned at the start of the content to save; it
	 *              is read to the end but not closed here
	 */
	private void saveHtmlToTxt(BufferedReader input) {
		System.out.println("please enter the file path you want to save");
		String path = console.next();
		// Opening the file inside try-with-resources means a failed open is
		// reported once and the write/close code is never run on a null stream.
		try (FileOutputStream output = new FileOutputStream(path)) {
			// readLine() strips the line terminator, so it has to be written
			// back or the whole document collapses onto a single line.
			byte[] lineBreak = System.lineSeparator().getBytes();
			String str;
			while ((str = input.readLine()) != null) {
				output.write(str.getBytes());
				output.write(lineBreak);
			}
		} catch (IOException e) {
			e.printStackTrace();
		}
	}

	/**
	 * Program entry point.
	 *
	 * @param args command-line arguments; not used
	 */
	public static void main(String[] args) {
		new ReadUrlToTxt();
	}

}