根据 URL 地址获取其页面的 HTML 文本的 Java 源码

import java.io.*;
import java.net.*;
import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;

/**
 * HTML utility class.
 *
 * <p>All working state is kept in local variables, so the static methods hold
 * no shared mutable state between calls.
 *
 * @author MIKUScallion
 */
public class Html {

    /** Size of the buffer used when copying the response body. */
    private static final int BUFFER_SIZE = 8192;

    /** Marker that introduces the charset parameter in a Content-Type value. */
    private static final String CHARSET_PREFIX = "charset=";

    /**
     * Fetches the content behind a URL and returns it as text.
     *
     * <p>The whole response body is read as bytes first and decoded once, so a
     * multi-byte character that straddles a read boundary is not corrupted.
     * The charset is taken from the response's Content-Type header when it
     * declares a supported one; otherwise UTF-8 is used.
     *
     * @param str the URL to fetch, as a string
     * @return the response body as one string, or {@code null} if the URL is
     *         malformed or an I/O error occurs (the stack trace is printed to
     *         standard error in that case)
     */
    public static String getHtmlCode(String str) {
        try {
            URL url = new URL(str);
            URLConnection connection = url.openConnection();
            // try-with-resources closes the stream even when reading fails.
            try (InputStream in = connection.getInputStream()) {
                ByteArrayOutputStream body = new ByteArrayOutputStream();
                byte[] buffer = new byte[BUFFER_SIZE];
                int len;
                while ((len = in.read(buffer)) != -1) {
                    body.write(buffer, 0, len);
                }
                // Headers are available once the input stream has been opened.
                Charset charset = charsetOf(connection.getContentType());
                return new String(body.toByteArray(), charset);
            }
        } catch (IOException e) {
            // MalformedURLException is an IOException, so one handler covers both.
            // Existing callers rely on the null return, so the error is reported
            // on standard error rather than propagated.
            e.printStackTrace();
            return null;
        }
    }

    /**
     * Extracts the charset from a Content-Type header value.
     *
     * @param contentType the header value, e.g. {@code text/html; charset=GBK};
     *                    may be {@code null}
     * @return the declared charset, or UTF-8 when none is declared or the
     *         declared name is illegal or unsupported
     */
    private static Charset charsetOf(String contentType) {
        if (contentType == null) {
            return StandardCharsets.UTF_8;
        }
        String[] parts = contentType.split(";");
        // parts[0] is the media type itself; parameters start at index 1.
        for (int i = 1; i < parts.length; i++) {
            String param = parts[i].trim();
            if (!param.regionMatches(true, 0, CHARSET_PREFIX, 0, CHARSET_PREFIX.length())) {
                continue;
            }
            String name = param.substring(CHARSET_PREFIX.length()).trim();
            // The value may be quoted: charset="utf-8".
            if (name.length() >= 2 && name.startsWith("\"") && name.endsWith("\"")) {
                name = name.substring(1, name.length() - 1);
            }
            try {
                return Charset.forName(name);
            } catch (IllegalArgumentException ignored) {
                // Illegal or unsupported charset name: fall back to UTF-8.
                return StandardCharsets.UTF_8;
            }
        }
        return StandardCharsets.UTF_8;
    }
}

PS: TIME MAGIC 系列文章年代久远,无法保证其完全正确性。

封面图来自:砂時計

文章来源:

Author:大刀分享站-dddog.com.cn
link:https://www.dddog.com.cn/tutorial/time-magic-1/