import java.io.*;
import java.net.*;
import java.awt.event.*;
import java.util.*;
import java.util.regex.*;

/**
 * A minimal breadth-first web spider.
 *
 * <p>Starting from a seed URL, it downloads each page line by line, prints the
 * page URL, prints every {@code http://} link found on the page (tab-indented),
 * and queues links it has not seen before for a later visit. Fetch failures are
 * printed and the crawl continues with the next queued URL.
 */
public class Spider {

    /**
     * URLs that have already been dequeued for fetching, in visit order.
     * Anything present here when {@link #main} starts is treated as visited
     * and will not be fetched again.
     */
    public static Vector<String> filelist = new Vector<String>();

    /** Seed URL used when no URL is supplied on the command line. */
    private static String inputFile = "http://google.com";

    /** Matches an {@code http://} URL up to the next double quote or whitespace; compiled once. */
    private static final Pattern LINK_PATTERN = Pattern.compile("http://[^\"\\s]+");

    /** Connect/read timeout so one unresponsive host cannot stall the whole crawl. */
    private static final int TIMEOUT_MILLIS = 10000;

    /**
     * Runs the crawl until no unvisited URLs remain.
     *
     * @param argv optional; {@code argv[0]} overrides the default seed URL
     */
    public static void main(String argv[]) {
        String start = (argv != null && argv.length > 0) ? argv[0] : inputFile;

        // "seen" covers everything visited or already queued, giving O(1) duplicate
        // checks; filelist remains the public, ordered record of visited URLs.
        Set<String> seen = new HashSet<String>(filelist);
        Queue<String> pending = new ArrayDeque<String>();
        if (seen.add(start)) {
            pending.add(start);
        }

        while (!pending.isEmpty()) {
            String url = pending.remove();
            // Record the visit before fetching so a failing URL is never retried.
            filelist.add(url);
            System.out.println(url);

            // try-with-resources closes the reader (and the underlying stream)
            // even when reading fails part-way through the page.
            try (BufferedReader reader = open(url)) {
                String line;
                while ((line = reader.readLine()) != null) {
                    for (String link : extractLinks(line)) {
                        System.out.println("\t" + link);
                        if (seen.add(link)) {
                            pending.add(link);
                        }
                    }
                }
            } catch (Exception e) {
                // Best-effort crawl: report the failure and move on to the next URL.
                System.out.println(e);
            }
        }
    }

    /**
     * Returns every {@code http://} link found in {@code line}, in order of
     * appearance (duplicates included).
     *
     * @param line one line of page text
     * @return the matched links; empty if there are none
     */
    static List<String> extractLinks(String line) {
        List<String> links = new ArrayList<String>();
        Matcher m = LINK_PATTERN.matcher(line);
        while (m.find()) {
            links.add(m.group());
        }
        return links;
    }

    /** Opens {@code url} for line-oriented reading with connect and read timeouts applied. */
    private static BufferedReader open(String url) throws IOException {
        URLConnection connection = new URL(url).openConnection();
        connection.setConnectTimeout(TIMEOUT_MILLIS);
        connection.setReadTimeout(TIMEOUT_MILLIS);
        return new BufferedReader(new InputStreamReader(connection.getInputStream()));
    }
}