Added priority mechanism.
[utils] / crawler / basic / src / org / wamblee / crawler / impl / App.java
index 65c7f80250b8d1321e0711761cb063622b51362c..d4ca4709c78a19665736f93cdd4d543582d6942f 100644 (file)
@@ -2,13 +2,9 @@ package org.wamblee.crawler.impl;
 
 import java.io.File;
 import java.io.FileInputStream;
-import java.io.FileOutputStream;
 import java.io.InputStream;
-import java.io.PrintStream;
 
 import org.apache.commons.httpclient.HttpClient;
-import org.apache.commons.logging.Log;
-import org.apache.commons.logging.LogFactory;
 import org.dom4j.Element;
 import org.wamblee.crawler.Action;
 import org.wamblee.crawler.Configuration;
@@ -33,57 +29,52 @@ import org.wamblee.crawler.PageException;
  */
 
 /**
- * Entry point for the crawler.
+ * Test application that uses the crawler.
  */
 public final class App {
-    
+
     /**
      * Disabled constructor.
-     *
+     * 
      */
-    private App() { 
+    private App() {
         // Empty
     }
-
-    private static final Log LOG = LogFactory.getLog(App.class);
-
-    private static final String LOG_FILE = "crawler.log";
-
+    
+    /**
+     * Runs a test crawl from the start URL through a fixed sequence of actions.
+     * 
+     * @param aArgs
+     *            Arguments. The first argument is the crawler config file
+     *            name and the second argument is the start URL.
+     * @throws Exception
+     *             In case of problems.
+     */
     public static void main(String[] aArgs) throws Exception {
         String configFileName = aArgs[0];
         String starturl = aArgs[1];
 
-        FileOutputStream fos = new FileOutputStream(new File(LOG_FILE));
-        PrintStream os = new PrintStream(fos);
-
-        try {
-            ConfigurationParser parser = new ConfigurationParser(os);
-            InputStream configFile = new FileInputStream(new File(
-                    configFileName));
-            Configuration config = parser.parse(configFile);
-
-            HttpClient client = new HttpClient();
-            // client.getHostConfiguration().setProxy("localhost", 3128);
-
-            Crawler crawler = new CrawlerImpl(client, config);
-
-            System.out.println("Retrieving: " + starturl);
-            Page page = crawler.getPage(starturl);
-            showPage(page);
-            page = page.getAction("channels-favorites").execute();
-            recordInterestingShows(page);
-            showPage(page);
-            page = page.getAction("Nederland 1").execute();
-            showPage(page);
-            page = page.getAction("right-now").execute();
-            showPage(page);
-            page = page.getAction("Het elfde uur").execute();
-            showPage(page);
-        } finally {
-            os.flush();
-            os.close();
-            System.out.println("Output written on '" + LOG_FILE + "'");
-        }
+        ConfigurationParser parser = new ConfigurationParser();
+        InputStream configFile = new FileInputStream(new File(configFileName));
+        Configuration config = parser.parse(configFile);
+
+        HttpClient client = new HttpClient();
+        // client.getHostConfiguration().setProxy("localhost", 3128);
+
+        Crawler crawler = new CrawlerImpl(client, config);
+
+        System.out.println("Retrieving: " + starturl);
+        Page page = crawler.getPage(starturl);
+        showPage(page);
+        page = page.getAction("channels-favorites").execute();
+        recordInterestingShows(page);
+        showPage(page);
+        page = page.getAction("Nederland 1").execute();
+        showPage(page);
+        page = page.getAction("right-now").execute();
+        showPage(page);
+        page = page.getAction("Het elfde uur").execute();
+        showPage(page);
     }
 
     /**
@@ -107,7 +98,8 @@ public final class App {
         }
     }
 
-    private static void examineChannel(String aChannel, Page aPage) throws PageException {
+    private static void examineChannel(String aChannel, Page aPage)
+            throws PageException {
         Action[] programs = aPage.getActions();
         for (Action program : programs) {
             System.out.println(aChannel + " - " + program.getName());