这是一个从网页源文件中得到链接的实现代码，和大家分享一下：
import java.io.*;
import java.net.*;
import java.util.*;
/**
 * Downloads a web page to a local file and loads the saved text into memory.
 *
 * <p>Intended call order: {@link #setURL(String)}, {@link #setFileName()},
 * {@link #downFile()}, then {@link #readFile()}.
 */
class ScanPage {
    /** Local file name used when the URL ends with '/' and therefore names no file. */
    private static final String DEFAULT_FILE_NAME = "index.html";

    /**
     * Text of the page most recently loaded by {@link #readFile()}.
     * The field is static, so it is shared by every instance of this class.
     */
    private static String strPage;

    /** Address of the page to download. */
    private String strUrl;

    /** Name of the local file the page is saved to and read back from. */
    private String fileName;

    /**
     * Sets the address of the page to download.
     *
     * @param strUrl the page address, e.g. {@code http://host/dir/page.html}
     */
    public void setURL(String strUrl) {
        this.strUrl = strUrl;
    }

    /**
     * Derives the local file name from the address: the text after the last '/'.
     *
     * <p>If the address contains no '/', the whole address is used. If it ends with
     * '/', {@value #DEFAULT_FILE_NAME} is used so that a usable file name always results.
     *
     * @throws IllegalStateException if no address has been set yet
     */
    public void setFileName() {
        if (strUrl == null) {
            throw new IllegalStateException("setURL must be called before setFileName");
        }
        // lastIndexOf returns -1 when there is no '/', so "+ 1" then keeps the whole string;
        // it also drops the '/' itself so the name is relative, not anchored at the root.
        String name = strUrl.substring(strUrl.lastIndexOf('/') + 1);
        fileName = name.isEmpty() ? DEFAULT_FILE_NAME : name;
    }

    /**
     * Downloads the page at the configured address into the local file.
     *
     * @throws IOException if the address is malformed, or the page cannot be read,
     *                     or the local file cannot be written
     */
    public void downFile() throws IOException {
        URL url = new URL(strUrl);
        // try-with-resources closes both streams even when the copy fails part-way.
        try (InputStream in = url.openStream();
             OutputStream out = new FileOutputStream(fileName)) {
            byte[] buffer = new byte[512];
            int len;
            while ((len = in.read(buffer)) != -1) {
                out.write(buffer, 0, len);
            }
        }
    }

    /**
     * Reads the local file line by line into the shared page text, terminating every
     * line with {@code "\n"}. The file is decoded with the platform default charset.
     *
     * @throws IOException if the local file cannot be opened or read
     */
    public void readFile() throws IOException {
        StringBuilder sb = new StringBuilder();
        try (BufferedReader reader = new BufferedReader(new FileReader(fileName))) {
            String line;
            while ((line = reader.readLine()) != null) {
                sb.append(line).append("\n");
            }
        }
        strPage = sb.toString();
    }

    /**
     * Placeholder for title extraction; currently always returns the empty string.
     *
     * @return the empty string
     */
    public String getTitle() {
        return "";
    }
}
|