X-Git-Url: http://wamblee.org/gitweb/?a=blobdiff_plain;f=crawler%2Fkiss%2Fsrc%2Forg%2Fwamblee%2Fcrawler%2Fkiss%2FProgramConfigurationParser.java;h=e9ba272e3ec33fe25497c6637d87974af91075f8;hb=8baad2389febcbcd9132fbb62e6329247275a000;hp=71719799c2162296902da68e8f6c7612382fc5b0;hpb=33225df8dfc5d87809fd0923b585c74245ad26b8;p=utils diff --git a/crawler/kiss/src/org/wamblee/crawler/kiss/ProgramConfigurationParser.java b/crawler/kiss/src/org/wamblee/crawler/kiss/ProgramConfigurationParser.java index 71719799..e9ba272e 100644 --- a/crawler/kiss/src/org/wamblee/crawler/kiss/ProgramConfigurationParser.java +++ b/crawler/kiss/src/org/wamblee/crawler/kiss/ProgramConfigurationParser.java @@ -21,21 +21,29 @@ import java.util.ArrayList; import java.util.Iterator; import java.util.List; +import org.dom4j.Attribute; import org.dom4j.Document; import org.dom4j.DocumentException; import org.dom4j.Element; import org.dom4j.io.SAXReader; +import org.wamblee.conditions.AndCondition; import org.wamblee.conditions.Condition; -import org.wamblee.conditions.OrCondition; +import org.wamblee.conditions.PropertyRegexCondition; /** * Parse the configuration of desired programs. */ -public class ProgramConfigurationParser { - - +class ProgramConfigurationParser { + private static final String ELEM_PROGRAM = "program"; - private static final String ELEM_PATTERN = "name"; + + private static final String ELEM_PATTERN = "match"; + + private static final String ELEM_ACTION = "action"; + + private static final String ELEM_CATEGORY = "category"; + + private static final String ACTION_NOTIFY = "notify"; /** * Parses the condition used to match the desired programs. @@ -44,20 +52,48 @@ public class ProgramConfigurationParser { * Input stream to parse from. * @return Condition. */ - Condition parse(InputStream aStream) { + List parse(InputStream aStream) { + List filters = new ArrayList(); try { SAXReader reader = new SAXReader(); Document document = reader.read(aStream); Element root = document.getRootElement(); - List> conditions = new ArrayList>(); - for (Iterator i = root.elementIterator(ELEM_PROGRAM); i.hasNext(); ) { - Element program = (Element)i.next(); - String pattern = ".*" + program.element(ELEM_PATTERN).getText() + ".*"; - conditions.add(new ProgramNameMatcher(pattern)); + for (Iterator i = root.elementIterator(ELEM_PROGRAM); i.hasNext();) { + Element program = (Element) i.next(); + + Element categoryElem = program.element(ELEM_CATEGORY); + String category = ""; + if ( categoryElem != null ) { + category = categoryElem.getText().trim(); + } + + Element actionElem = program.element(ELEM_ACTION); + ProgramAction action = new RecordProgramAction(); + if (actionElem != null) { + if (actionElem.getText().equals(ACTION_NOTIFY)) { + action = new InterestingProgramAction(category); + } + } + + List> regexConditions = + new ArrayList>(); + for (Iterator j = program.elementIterator(ELEM_PATTERN); j.hasNext(); ) { + Element patternElem = (Element)j.next(); + String fieldName = "name"; + Attribute fieldAttribute = patternElem.attribute("field"); + if ( fieldAttribute != null ) { + fieldName = fieldAttribute.getText(); + } + String pattern = ".*(" + patternElem.getText() + + ").*"; + regexConditions.add(new PropertyRegexCondition(fieldName, pattern, true)); + } + Condition condition = new AndCondition(regexConditions); + filters.add(new ProgramFilter(condition, action)); } - return new OrCondition(conditions); + return filters; } catch (DocumentException e) { throw new RuntimeException("Error parsing program configuraiton", e); }