home *** CD-ROM | disk | FTP | other *** search
import java.io.InputStream;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.Enumeration;
import java.util.Locale;
import java.util.Properties;
-
- class SearchEngineSpider {
- URL home;
- String homes;
- Properties done;
- Properties todo;
-
- SearchEngineSpider(URL var1, String var2) {
- this.home = var1;
- this.done = new Properties();
- this.todo = new Properties();
- this.homes = var1.toString();
- this.follow(var1, var2);
- }
-
- public void follow(URL var1, String var2) {
- int var3 = var2.lastIndexOf(35);
- if (var3 >= 0) {
- var2 = var2.substring(0, var3);
- }
-
- try {
- URL var4 = new URL(var1, var2);
- String var5 = var4.toString();
- if (this.done.get(var5) == null) {
- this.todo.put(var5, "");
- return;
- }
- } catch (Exception var6) {
- }
-
- }
-
- void run(SearchEngineGenerator var1) {
- Enumeration var2;
- while((var2 = this.todo.keys()).hasMoreElements()) {
- String var3 = (String)var2.nextElement();
- this.todo.remove(var3);
- this.done.put(var3, "");
-
- try {
- URL var4 = new URL(var3);
- String var5 = var4.toString();
- String var6 = var5.toUpperCase();
- if (!var5.startsWith(this.homes)) {
- System.out.println("Ignoriere externen Link " + var5);
- } else if (!var6.endsWith("/") && !var6.endsWith(".HTM") && !var6.endsWith(".TXT") && !var6.endsWith(".HTML") && !var6.endsWith(".SHTML")) {
- System.out.println("Ignoriere Link mit unbekannter Erweiterung: " + var5);
- } else {
- System.out.println("Indiziere " + var5);
- DocumentParser var7 = new DocumentParser(var1, var4.openStream(), this, var4);
- var7.parse(var3.substring(this.homes.length()));
- }
- } catch (Exception var8) {
- System.err.println("Exception: " + ((Throwable)var8).getMessage());
- }
- }
-
- }
- }
-