X-Git-Url: http://wamblee.org/gitweb/?a=blobdiff_plain;f=crawler%2Fkiss%2Fsrc%2Forg%2Fwamblee%2Fcrawler%2Fkiss%2Fmain%2FKissCrawler.java;h=5125f407d45094b4bc71698ef47c5fe375691ed0;hb=fe5539c3fc40659242cac7b2954a04101ba94504;hp=a9a8097a7ae038a92bda4ded8d158592bedcdc6a;hpb=fcb3fcbfe75c778711c2f91b66d0a905562379f9;p=utils diff --git a/crawler/kiss/src/org/wamblee/crawler/kiss/main/KissCrawler.java b/crawler/kiss/src/org/wamblee/crawler/kiss/main/KissCrawler.java index a9a8097a..5125f407 100644 --- a/crawler/kiss/src/org/wamblee/crawler/kiss/main/KissCrawler.java +++ b/crawler/kiss/src/org/wamblee/crawler/kiss/main/KissCrawler.java @@ -46,6 +46,7 @@ import org.wamblee.crawler.kiss.guide.Time; import org.wamblee.crawler.kiss.guide.TimeInterval; import org.wamblee.crawler.kiss.notification.NotificationException; import org.wamblee.crawler.kiss.notification.Notifier; +import org.wamblee.general.BeanFactory; import org.wamblee.xml.ClasspathUriResolver; import org.wamblee.xml.XslTransformer; @@ -65,7 +66,7 @@ public class KissCrawler { /** * Default socket timeout to use. */ - private static final int SOCKET_TIMEOUT = 20000; + private static final int SOCKET_TIMEOUT = 10000; /** * Regular expression for matching time interval strings in the retrieved @@ -89,7 +90,10 @@ public class KissCrawler { public static void main(String[] aArgs) throws Exception { String crawlerConfig = new File(aArgs[0]).getCanonicalPath(); String programConfig = new File(aArgs[1]).getCanonicalPath(); - new KissCrawler(START_URL, SOCKET_TIMEOUT, crawlerConfig, programConfig); + + BeanFactory factory = new StandaloneCrawlerBeanFactory(); + Notifier notifier = factory.find(Notifier.class); + new KissCrawler(START_URL, SOCKET_TIMEOUT, crawlerConfig, programConfig, notifier, new Report()); } /** @@ -101,14 +105,16 @@ public class KissCrawler { * Configuration file for the crawler. * @param aProgramConfig * Configuration file describing interesting shows. + * @param aNotifier Object used to send notifications of the results. + * @param aReport Report to use. * @throws IOException * In case of problems reading files. - * @throws MessagingException - * In case of problems sending a mail notification. + * @throws NotificationException In case notification fails. + * @throws PageException In case of problems retrieving the TV guide. */ public KissCrawler(String aCrawlerConfig, - String aProgramConfig) throws IOException, NotificationException { - this(START_URL, SOCKET_TIMEOUT, aCrawlerConfig, aProgramConfig); + String aProgramConfig, Notifier aNotifier, Report aReport) throws IOException, NotificationException, PageException { + this(START_URL, SOCKET_TIMEOUT, aCrawlerConfig, aProgramConfig, aNotifier, aReport); } @@ -124,13 +130,15 @@ public class KissCrawler { * Configuration file for the crawler. * @param aProgramConfig * Configuration file describing interesting shows. + * @param aNotifier Object used to send notifications of the results. + * @param aReport Report to use. * @throws IOException * In case of problems reading files. - * @throws MessagingException - * In case of problems sending a mail notification. + * @throws NotificationException In case notification fails. + * @throws PageException In case of problems retrieving the TV guide. */ public KissCrawler(String aStartUrl, int aSocketTimeout, String aCrawlerConfig, - String aProgramConfig) throws IOException, NotificationException { + String aProgramConfig, Notifier aNotifier, Report aReport) throws IOException, NotificationException, PageException { _pattern = Pattern.compile(TIME_REGEX); @@ -145,25 +153,23 @@ public class KissCrawler { Crawler crawler = createCrawler(aCrawlerConfig, client, transformer); InputStream programConfigFile = new FileInputStream(new File( aProgramConfig)); - ProgramConfigurationParser parser = new ProgramConfigurationParser( - transformer); + ProgramConfigurationParser parser = new ProgramConfigurationParser(); parser.parse(programConfigFile); List programFilters = parser.getFilters(); - Report report = new Report(); - try { - Page page = getStartPage(aStartUrl, crawler, report); - TVGuide guide = createGuide(page, report); + Page page = getStartPage(aStartUrl, crawler, aReport); + TVGuide guide = createGuide(page, aReport); PrintVisitor printer = new PrintVisitor(System.out); guide.accept(printer); - processResults(programFilters, guide, parser.getNotifier(), - report); + processResults(programFilters, guide, aNotifier, + aReport); } catch (PageException e) { - report.addMessage("Problem getting TV guide", e); + aReport.addMessage("Problem getting TV guide", e); LOG.info("Problem getting TV guide", e); + throw e; } - parser.getNotifier().send(report.asXml()); + aNotifier.send(aReport.asXml()); } finally { System.out.println("Crawler finished"); } @@ -252,10 +258,15 @@ public class KissCrawler { * @param aReport * Report to use. * @return TV guide. + * @throws PageException In case of problem getting the tv guide. */ - private TVGuide createGuide(Page aPage, Report aReport) { + private TVGuide createGuide(Page aPage, Report aReport) throws PageException { LOG.info("Obtaining full TV guide"); Action[] actions = aPage.getActions(); + if ( actions.length == 0 ) { + LOG.error("No channels found"); + throw new PageException("No channels found"); + } List channels = new ArrayList(); for (Action action : actions) { try {